rm(list = ls())
load("dataBJPOLS_incl_out.RData")

inst.1 <- "judgeiv_hd * as.factor(keep)"
endo.1 <- "pti * as.factor(keep)"
outc.1 <- "vote_post"

time.controls <- "as.factor(court_time1) + as.factor(court_time2) + as.factor(court_dow) + as.factor(severity)"
demo.controls <- "age + I(age^2) +  as.factor(race4) + female + vote_pre + as.factor(noteli) + regis_before"
case.controls <- "as.factor(any_drug) +  as.factor(any_weapon) +  as.factor(any_prop) + as.factor(any_prior_case)"

form.1 <- formula(paste(outc.1, "~", endo.1, "+" , time.controls, "|", inst.1, "+", time.controls))
form.2 <- formula(paste(outc.1, "~", endo.1, "+" , time.controls, "+", demo.controls, "|", inst.1, "+", time.controls, "+", demo.controls))
form.3 <- formula(paste(outc.1, "~", endo.1, "+" , time.controls, "+", demo.controls, "+", case.controls, "|", inst.1, "+", time.controls, "+", demo.controls, "+", case.controls))

results <- resultsO <- list()
run.boot <- T

if(run.boot) {
  set.seed(1231)
  for(i in 1:500) {
    
    out <- last.cases[, this_id_fa[sample.int(.N, .N, TRUE)], by = c("judge_cat", "court_time1")]
    last.cases.boot <- last.cases[last.cases$this_id_fa %in% out$V1, ]
    
    m1a1 <- ivreg(form.1, data = last.cases.boot)
    m1a2 <- ivreg(form.2, data = last.cases.boot)
    m1a3 <- ivreg(form.3, data = last.cases.boot)
    
    results[[i]] <- c(m1a1$coefficients["pti"], 
                      m1a2$coefficients["pti"], 
                      m1a3$coefficients["pti"])
    resultsO[[i]] <- c(m1a1$coefficients["pti:as.factor(keep)1"], 
                      m1a2$coefficients["pti:as.factor(keep)1"], 
                      m1a3$coefficients["pti:as.factor(keep)1"])
  }
  
  SEs <- round(apply(do.call('rbind', results), 2, sd), 2)
  SEsO <- round(apply(do.call('rbind', resultsO), 2, sd), 2)
 }

m1a1 <- ivreg(form.1, data = last.cases)
m1a2 <- ivreg(form.2, data = last.cases)
m1a3 <- ivreg(form.3, data = last.cases)

res1_pti <- coefficients(m1a1)[grep("pti", names(coefficients(m1a1)))]
res2_pti <- coefficients(m1a2)[grep("pti", names(coefficients(m1a2)))]
res3_pti <- coefficients(m1a3)[grep("pti", names(coefficients(m1a3)))]

m1a1_d <- summary(m1a1, vcov = sandwich, diagnostic = T)
m1a2_d <- summary(m1a2, vcov = sandwich, diagnostic = T)
m1a3_d <- summary(m1a3, vcov = sandwich, diagnostic = T)

m1a1_d1 <- m1a1_d$diagnostics[grep("Weak", rownames(m1a1_d$diagnostics)), 3]
m1a2_d1 <- m1a2_d$diagnostics[grep("Weak", rownames(m1a2_d$diagnostics)), 3]
m1a3_d1 <- m1a3_d$diagnostics[grep("Weak", rownames(m1a3_d$diagnostics)), 3]

p1 <- data.table(cbind(res1_pti, res2_pti, res3_pti))
p1$V4 <- 1
p1$V5 <- 1:nrow(p1)
p1$V6 <- "Estimate"
colnames(p1) <- paste0("V", 1:6)

p2 <- data.table(t(cbind(c(SEs[1], SEs[2], SEs[3]),
                       c(SEsO[1], SEsO[2], SEsO[3]))))
p2$V4 <- 2
p2$V5 <- 1:nrow(p2)
p2$V6 <- "Std. Error"
colnames(p2) <- paste0("V", 1:6)

p3 <- data.table(round(cbind(m1a1_d1, m1a2_d1, m1a3_d1), 2))
colnames(p3) <- c("V1", "V2", "V3")
p3$V4 <- 3
p3$V5 <- 1:nrow(p3)
p3$V6 <- "F-stat"

table <- rbind(p1, p2, p3)
table <- table[order(V5, V4), ]
table$V4 <- table$V5 <- NULL
p4 <- data.table(m1a1$nobs, m1a2$nobs, m1a3$nobs)    
p4$V6 <- "N"

table <- rbind(table, p4)
table <- table[, c("V6", "V1", "V2", "V3")]
colnames(table) <- c("Variable", "Model 1", "Model 2", "Model 3")
table




